"""第 0008 题：一个 HTML 文件，找出里面的正文。"""
from bs4 import BeautifulSoup


def get_html_content(html):
    """Return the main text of the HTML file at path ``html``.

    The file is read as UTF-8 and parsed with BeautifulSoup using the
    ``lxml`` parser. The text of the ``<div id="readme">`` element is
    returned when that element exists. Otherwise the text of ``<body>``
    is returned, or the text of the whole document when there is no body.

    Args:
        html: Path of the HTML file to read.

    Returns:
        The extracted text, as produced by ``get_text()`` on the chosen
        element.

    Raises:
        OSError: If the file cannot be opened.
        UnicodeDecodeError: If the file is not valid UTF-8.
    """
    with open(html, encoding='utf-8') as f:
        markup = f.read()

    soup = BeautifulSoup(markup, 'lxml')

    # find() returns None when no element matches; calling get_text() on
    # that would raise AttributeError, so fall back to broader containers.
    target = soup.find('div', id="readme")
    if target is None:
        target = soup.body
    if target is None:
        target = soup
    return target.get_text()


if __name__ == '__main__':
    # Run the demo only when this file is executed as a script, so that
    # importing the module does not read 'test.html' or print anything.
    print(get_html_content('test.html'))
